"""Download the Dutch ("nl") train split of VoxPopuli and save it to disk."""
import os

# Point the Hugging Face libraries at the mirror site.
# This MUST run before `datasets` is imported: the Hugging Face libraries read
# HF_ENDPOINT into module-level constants at import time, so setting it after
# the import leaves the default endpoint in effect.
os.environ["HF_ENDPOINT"] = "https://hf-mirror.com"

from datasets import load_dataset  # noqa: E402  (must follow the HF_ENDPOINT setup)

# 1. Load the dataset (fetched through the mirror configured above).
dataset = load_dataset("facebook/voxpopuli", "nl", split="train")

# 2. Save the dataset to the local target directory.
dataset.save_to_disk("./voxpopuli_nl_train")

# Alternative: fetch only the raw "nl" files with the Hugging Face CLI instead:
#   hf download facebook/voxpopuli --repo-type dataset --include "data/nl/*" --local-dir data/nl
